#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Module-level settings dict, grouped into remote, environment and learner
# sections. Keys and values are plain literals; nothing is computed here.
# NOTE(review): how each key is consumed is not visible in this file --
# confirm against the modules that import `config`.
config = {
    #==========  remote config ==========
    # Address and port of the server.
    'server_ip': 'localhost',
    'server_port': 8037,

    #==========  env config ==========
    'env_name': 'PongNoFrameskip-v4',
    # NOTE(review): presumably the side length of the resized observation
    # frame -- confirm against the environment wrapper.
    'env_dim': 42,

    #==========  learner config ==========
    'train_batch_size': 128,
    'max_predict_batch_size': 16,
    'predict_thread_num': 2,
    # NOTE(review): presumably the rollout length per actor sample, in
    # steps -- confirm against the actor code.
    't_max': 5,
    'gamma': 0.99,
    'lambda': 1.0,  # GAE

    # learning rate adjustment schedule: (train_step, learning_rate)
    'lr_scheduler': [(0, 0.0005), (100000, 0.0003), (200000, 0.0001)],

    # coefficient of policy entropy adjustment schedule: (train_step, coefficient)
    # NOTE(review): the coefficient is negative; the sign convention depends
    # on how the loss combines the entropy term -- confirm before changing.
    'entropy_coeff_scheduler': [(0, -0.01)],
    'vf_loss_coeff': 0.5,
    # The `_s` suffix suggests this interval is in seconds -- TODO confirm.
    'log_metrics_interval_s': 10,
}