config.yaml 2.5 KB
Newer Older
M
add gnn  
malin10 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

M
malin10 已提交
15
# workspace
C
Chengmo 已提交
16
workspace: "models/recall/gnn"
M
add gnn  
malin10 已提交
17

M
malin10 已提交
18 19 20
# list of datasets
dataset:
- name: dataset_train # name of dataset to distinguish different datasets
C
Chengmo 已提交
21
  batch_size: 10
M
malin10 已提交
22 23 24 25 26 27 28 29
  type: DataLoader # or QueueDataset
  data_path: "{workspace}/data/train"
  data_converter: "{workspace}/reader.py"
# Dataset entry used for inference; phases refer to it via `dataset_name: dataset_infer`.
- name: dataset_infer # name of dataset to distinguish different datasets
  batch_size: 50
  type: DataLoader # or QueueDataset
  # NOTE(review): "{workspace}" presumably expands to the top-level `workspace` value — confirm.
  data_path: "{workspace}/data/test"
  data_converter: "{workspace}/evaluate_reader.py"
M
add gnn  
malin10 已提交
30

M
malin10 已提交
31 32 33 34 35 36 37 38
# hyper parameters of user-defined network
hyper_parameters:
  optimizer:
    class: Adam
    learning_rate: 0.001
    decay_steps: 3
    decay_rate: 0.1
    l2: 0.00001
M
malin10 已提交
39
  sparse_feature_number: 43098
M
malin10 已提交
40 41 42
  sparse_feature_dim: 100
  corpus_size: 719470
  gnn_propogation_steps: 1
M
add gnn  
malin10 已提交
43

M
malin10 已提交
44
# select runner by name
M
bug fix  
malin10 已提交
45
mode: [single_cpu_train, single_cpu_infer]
M
malin10 已提交
46 47 48
# config of each runner.
# a runner is a kind of Paddle training class that wraps the train/infer process.
runner:
M
bug fix  
malin10 已提交
49
- name: single_cpu_train
J
Jinhua Liang 已提交
50
  class: train
M
malin10 已提交
51
  # number of epochs
M
bug fix  
malin10 已提交
52
  epochs: 5
M
malin10 已提交
53 54 55 56
  # device to run training or inference on
  device: cpu
  save_checkpoint_interval: 1 # save model interval of epochs
  save_inference_interval: 1 # save inference model interval of epochs
M
gnn  
malin10 已提交
57 58
  save_checkpoint_path: "increment_gnn" # save checkpoint path
  save_inference_path: "inference_gnn" # save inference path
M
malin10 已提交
59 60 61
  save_inference_feed_varnames: [] # feed vars of save inference
  save_inference_fetch_varnames: [] # fetch vars of save inference
  init_model_path: "" # load model path
M
malin10 已提交
62
  print_interval: 1
M
gnn  
malin10 已提交
63
  phases: [phase1]
M
bug fix  
malin10 已提交
64
- name: single_cpu_infer
C
Chengmo 已提交
65
  class: infer
M
malin10 已提交
66 67
  # device to run training or inference on
  device: cpu
C
Chengmo 已提交
68
  print_interval: 1
M
gnn  
malin10 已提交
69 70
  init_model_path: "increment_gnn" # load model path
  phases: [phase2]
M
add gnn  
malin10 已提交
71

M
malin10 已提交
72 73
# a runner runs all of its phases in each epoch
phase:
M
malin10 已提交
74
- name: phase1
M
malin10 已提交
75 76 77
  model: "{workspace}/model.py" # user-defined model
  dataset_name: dataset_train # select dataset by name
  thread_num: 1
M
gnn  
malin10 已提交
78 79 80 81
# Phase listed in `phases` of the single_cpu_infer runner.
- name: phase2
  model: "{workspace}/model.py" # user-defined model
  dataset_name: dataset_infer # select dataset by name; refers to the `dataset` entry named dataset_infer
  thread_num: 1