# Mirror of https://github.com/JoergFranke/ADNC.git
# Synced 2024-11-17 13:58:03 +08:00 (56 lines, 1.6 KiB, YAML)
#######################################
###       Global Configuration      ###
#######################################

# Values shared between sections. The `&batch_size` anchor declared here is
# the target of the `*batch_size` aliases used by the `mann` and `cnn`
# sections, so this mapping has to stay above them: a YAML alias can only
# refer to an anchor that appears earlier in the same document.
global:
  batch_size: &batch_size 32

#######################################
###     Training Configuration      ###
#######################################
# Training-run settings. Every key below is a child of `training`; the
# two-space indentation is what expresses that nesting.
training:
  epochs: 8
  learn_rate: 0.00003
  optimizer: 'rmsprop'
  # Block-style form of the one-entry mapping {'momentum': 0.9}; it loads to
  # the same data. Presumably forwarded to the optimizer selected above --
  # confirm against the consuming code.
  optimizer_config:
    momentum: 0.9
  gradient_clipping: 5
  # Lowercase `false` is the canonical YAML boolean and loads to the same
  # value as `False`.
  weight_decay: false

#######################################
###        MANN Configuration       ###
#######################################
# Model settings. Every key below is a child of `mann`. The two nested
# configs are written in block style; they load to the same mappings as the
# single-line {...} form, with booleans spelled as canonical `true`/`false`.
mann:
  name: 'mann1'
  seed: 25
  # NOTE(review): 0 looks like a placeholder that is filled in at runtime --
  # confirm against the code that loads this file.
  input_size: 0
  output_size: 0
  # Alias of the `&batch_size` anchor declared under `global`.
  batch_size: *batch_size
  input_embedding: true
  architecture: 'uni'
  controller_config:
    # One-element list.
    num_units: [512]
    layer_norm: true
    activation: 'tanh'
    cell_type: 'clstm'
    connect: 'sparse'
    attention: false
  memory_unit_config:
    cell_type: 'cmu'
    memory_length: 192
    memory_width: 128
    read_heads: 4
    write_heads: 1
    dnc_norm: true
    bypass_dropout: 0.9
  output_function: 'softmax'
  output_mask: true
  loss_function: 'cross_entropy'

###################################################################
#######                   CNN Daily Mail RC                  ######
###################################################################
# Data-set settings. Every key below is a child of `cnn`.
cnn:
  data_set: 'cnn'

  # Disabled keys, kept as comments exactly as they appeared.
  # data_dir: 'data_cnn'
  # tmp_dir: 'data_tmp'

  seed: 315
  # Alias of the `&batch_size` anchor declared under `global`.
  batch_size: *batch_size
  max_len: 1400

  answer_first: false
  # NOTE(review): `num_chached` looks like a misspelling of `num_cached`. It
  # is left unchanged because the consuming code presumably looks up this
  # exact key -- confirm before renaming.
  num_chached: 5
  threads: 1