mirror of
https://github.com/JoergFranke/ADNC.git
synced 2024-11-17 13:58:03 +08:00
add cnn model
This commit is contained in:
parent
9d9bfd8f75
commit
f8df19541b
55
experiments/pre_trained/cnn_rc_task/adnc/config.yml
Normal file
55
experiments/pre_trained/cnn_rc_task/adnc/config.yml
Normal file
@ -0,0 +1,55 @@
|
|||||||
|
#######################################
|
||||||
|
### Global Configuration ###
|
||||||
|
#######################################
|
||||||
|
|
||||||
|
global:  # values reused by other sections of this file via a YAML alias
|
||||||
|
batch_size: &batch_size 32  # defines anchor `batch_size`; referenced as `*batch_size` under `mann` and `cnn`
|
||||||
|
|
||||||
|
#######################################
|
||||||
|
### Training Configuration ###
|
||||||
|
#######################################
|
||||||
|
training:  # optimisation settings (the "Training Configuration" section)
|
||||||
|
epochs: 8
|
||||||
|
learn_rate: 0.00003  # i.e. 3e-5
|
||||||
|
optimizer: 'rmsprop'
|
||||||
|
optimizer_config: {'momentum':0.9}  # flow mapping; presumably extra arguments for the optimizer named above - confirm in the consumer
|
||||||
|
gradient_clipping: 5  # NOTE(review): whether this clips by value or by norm is not visible here - confirm
|
||||||
|
weight_decay: False  # capitalised literal; YAML 1.1 loaders resolve it to boolean false
|
||||||
|
|
||||||
|
|
||||||
|
#######################################
|
||||||
|
### MANN Configuration ###
|
||||||
|
#######################################
|
||||||
|
mann:  # model settings (the "MANN Configuration" section)
|
||||||
|
name: 'mann1'
|
||||||
|
seed: 25  # distinct from the `seed: 315` in the `cnn` section
|
||||||
|
input_size: 0  # NOTE(review): 0 is presumably a placeholder filled in at runtime - confirm
|
||||||
|
output_size: 0  # NOTE(review): presumably a placeholder like input_size - confirm
|
||||||
|
batch_size: *batch_size  # alias of the `&batch_size` anchor defined under `global` (32)
|
||||||
|
input_embedding: True
|
||||||
|
architecture: 'uni'
|
||||||
|
controller_config: {"num_units":[512], "layer_norm":True, "activation":'tanh', 'cell_type':'clstm', 'connect':'sparse', 'attention':False}  # flow mapping; `num_units` is a one-element list
|
||||||
|
memory_unit_config: {"cell_type":'cmu', "memory_length":192, "memory_width":128, "read_heads":4, "write_heads": 1, "layer_norm":True, "bypass_dropout":0.9}  # NOTE(review): unclear from here whether bypass_dropout 0.9 is a keep or a drop probability - confirm
|
||||||
|
output_function: "softmax"
|
||||||
|
output_mask: True
|
||||||
|
loss_function: 'cross_entropy'
|
||||||
|
|
||||||
|
|
||||||
|
###################################################################
|
||||||
|
####### CNN Daily Mail RC ######
|
||||||
|
###################################################################
|
||||||
|
cnn:  # data-set settings (the "CNN Daily Mail RC" section)
|
||||||
|
data_set: 'cnn'
|
||||||
|
|
||||||||
|
# data_dir: 'data_cnn'
|
||||||
|
# tmp_dir: 'data_tmp'
|
||||||
|
|
||||||||
|
seed: 315  # distinct from the `seed: 25` in the `mann` section
|
||||||
|
batch_size: *batch_size  # alias of the `&batch_size` anchor defined under `global` (32)
|
||||||
|
max_len: 1400  # NOTE(review): unit (tokens / words / characters) is not visible here - confirm
|
||||||
|
|
||||||||
|
answer_first: False
|
||||||
|
num_chached: 5  # NOTE(review): key is spelled "num_chached" (sic, likely "num_cached"); keep as-is unless the consumer is changed too
|
||||||
|
threads: 1
|
||||||
|
|
||||||
|
|
@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:7702dd0680280543ac27340f70e38405891d5b783861f98f7244c0b552b0ccb5
|
||||||
|
size 98847904
|
@ -0,0 +1,3 @@
|
|||||||
|
version https://git-lfs.github.com/spec/v1
|
||||||
|
oid sha256:14a929e0d3991197dbcf6a3b02951a2ba0d21de94af8278517c42058343c929a
|
||||||
|
size 1593
|
BIN
experiments/pre_trained/cnn_rc_task/adnc/word_idx_dict.pkl
Normal file
BIN
experiments/pre_trained/cnn_rc_task/adnc/word_idx_dict.pkl
Normal file
Binary file not shown.
Loading…
Reference in New Issue
Block a user