blob: 853a04aebbddebbb2543dadc6260b0a28ad577f6 [file] [log] [blame]
[common]
# method can be one of the followings - train,predict,load
mode = train
#ex: gpu0,gpu1,gpu2,gpu3
context = gpu0
# checkpoint prefix, check point will be saved under checkpoints folder with prefix
prefix = test_fc
# when mode is load or predict, model will be loaded from the file name with model_file under checkpoints
model_file = test_fc-0001
batch_size = 2
# log will be saved by the log_filename
log_filename = test.log
# checkpoint set n to save checkpoints after n epoch
save_checkpoint_every_n_epoch = 1
save_checkpoint_every_n_batch = 1000
is_bi_graphemes = False
tensorboard_log_dir = tblog/libri_sample
# if random_seed is -1 then it gets random seed from timestamp
mx_random_seed = -1
random_seed = -1
[data]
train_json = ./Libri_sample.json
test_json = ./Libri_sample.json
val_json = ./Libri_sample.json
language = en
width = 161
height = 1
channel = 1
stride = 1
[arch]
channel_num = 32
conv_layer1_filter_dim = [11, 41]
conv_layer1_stride = [2, 2]
conv_layer2_filter_dim = [11, 21]
conv_layer2_stride = [1, 2]
num_rnn_layer = 3
num_hidden_rnn_list = [1760, 1760, 1760]
num_hidden_proj = 0
num_rear_fc_layers = 0
num_hidden_rear_fc_list = []
act_type_rear_fc_list = []
#network: lstm, bilstm, gru, bigru
rnn_type = bigru
#vanilla_lstm or fc_lstm (no effect when network_type is gru, bigru)
lstm_type = fc_lstm
is_batchnorm = True
[train]
num_epoch = 70
learning_rate = 0.005
# constant learning rate annealing by factor
learning_rate_annealing = 1.1
# supports only sgd and adam
optimizer = adam
# for sgd
momentum = 0.9
# set to 0 to disable gradient clipping
clip_gradient = 0
initializer = Xavier
init_scale = 2
factor_type = in
weight_decay = 0.00001
# show progress every nth batches
show_every = 1
save_optimizer_states = True
normalize_target_k = 2
# overwrite meta files(feats_mean,feats_std,unicode_en_baidu_bi_graphemes.csv)
overwrite_meta_files = True
enable_logging_train_metric = True
enable_logging_validation_metric = True
[load]
load_optimizer_states = True
is_start_from_batch = False