add cnn model

This commit is contained in:
Joerg Franke 2018-07-04 23:59:51 +02:00
parent 9d9bfd8f75
commit f8df19541b
4 changed files with 61 additions and 0 deletions

View File

@ -0,0 +1,55 @@
# Experiment configuration with four top-level sections: global, training,
# mann and cnn. Nesting is significant: `batch_size` and `seed` occur in more
# than one section, so every key must stay indented under its section header
# or the entries collide as duplicate top-level keys.

#######################################
###       Global Configuration      ###
#######################################
global:
  # Anchored so the mann and cnn sections can alias the same value.
  batch_size: &batch_size 32

#######################################
###      Training Configuration     ###
#######################################
training:
  epochs: 8
  learn_rate: 0.00003
  optimizer: 'rmsprop'
  optimizer_config:
    momentum: 0.9
  gradient_clipping: 5
  weight_decay: false

#######################################
###        MANN Configuration       ###
#######################################
mann:
  name: 'mann1'
  seed: 25
  # NOTE(review): both sizes are 0 here; presumably they are filled in at
  # runtime from the data set -- confirm against the loader.
  input_size: 0
  output_size: 0
  batch_size: *batch_size
  input_embedding: true
  architecture: 'uni'
  controller_config:
    num_units: [512]
    layer_norm: true
    activation: 'tanh'
    cell_type: 'clstm'
    connect: 'sparse'
    attention: false
  memory_unit_config:
    cell_type: 'cmu'
    memory_length: 192
    memory_width: 128
    read_heads: 4
    write_heads: 1
    layer_norm: true
    bypass_dropout: 0.9
  output_function: 'softmax'
  output_mask: true
  loss_function: 'cross_entropy'

###################################################################
#######                  CNN Daily Mail RC                   ######
###################################################################
cnn:
  data_set: 'cnn'
  # data_dir: 'data_cnn'
  # tmp_dir: 'data_tmp'
  seed: 315
  batch_size: *batch_size
  max_len: 1400
  answer_first: false
  # NOTE(review): the key spelling looks like a typo for `num_cached`. It is
  # left unchanged because the code that reads this key is not visible here;
  # confirm with the consumer before renaming.
  num_chached: 5
  threads: 1

View File

@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:7702dd0680280543ac27340f70e38405891d5b783861f98f7244c0b552b0ccb5
size 98847904

View File

@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:14a929e0d3991197dbcf6a3b02951a2ba0d21de94af8278517c42058343c929a
size 1593