config.py

import os

################## for building word dictionary  ##################

max_word_num = 51200 - 2
cutoff_word_fre = 0

################## for training task  #########################
# path of training data
train_file = "data/train_data_examples.txt"
# path of testing data, if testing file does not exist,
# testing will not be performed at the end of each training pass
test_file = ""
# path of word dictionary, if this file does not exist,
# word dictionary will be built from training data.
vocab_file = "data/word_vocab.txt"
# directory to save the trained model
# create a new directory if the directoy does not exist
model_save_dir = "models"

batch_size = 32  # the number of training examples in one forward/backward pass
num_passes = 20  # how many passes to train the model

log_period = 50
save_period_by_batches = 50

use_gpu = False  # to use gpu or not
trainer_count = 1  # number of trainer

##################  for model configuration  ##################
rnn_type = "lstm"  # "gru" or "lstm"
emb_dim = 256
hidden_size = 256
stacked_rnn_num = 2

##################  for text generation  ##################
gen_file = "data/train_data_examples.txt"
gen_result = "data/gen_result.txt"
max_gen_len = 25  # the max number of words to generate
beam_size = 5
model_path = "models/rnn_lm_pass_00000.tar.gz"

if not os.path.exists(model_save_dir):
    os.mkdir(model_save_dir)