# Hyperparameter configuration for the attentive-reader model
# (config/deepmind_attentive_reader.py).
#
# Provenance: recovered from a cgit v1.2.3 patch view of commit
# f31caf61be87850f3afcd367d6eb9521b2f613da
#   Author:  Thomas Mesnard
#   Date:    Tue, 1 Mar 2016 00:27:15 +0100
#   Subject: Initial commit
# which created config/deepmind_attentive_reader.py (new file, 42 lines,
# blob 84a6cf0).
#
# This module only binds names. How each one is consumed is not visible
# here, so the notes below are hedged -- confirm against the training
# script and model/attentive_reader.py.

# NOTE(review): AdaDelta, Adam, Momentum and StepClipping are not referenced
# in this file; they are kept so they stay importable from this module.
from blocks.bricks import Tanh
from blocks.algorithms import (
    AdaDelta,
    Adam,
    BasicMomentum,
    CompositeRule,
    Momentum,
    RMSProp,
    StepClipping,
)
from blocks.initialization import Constant, IsotropicGaussian

# Model is not used in this file; presumably the caller reaches it as an
# attribute of this config module -- TODO confirm.
from model.attentive_reader import Model


# --- Data / batching ------------------------------------------------------
batch_size = 32
# presumably the number of batches gathered together for length sorting
# -- TODO confirm against the data pipeline.
sort_batch_count = 20

shuffle_questions = True

concat_ctx_and_question = False

# --- Vocabulary / embeddings ----------------------------------------------
n_entities = 550
embed_size = 200

# --- Recurrent encoders ---------------------------------------------------
# One list entry per layer is assumed (a single entry of size 256 each)
# -- TODO confirm.
ctx_lstm_size = [256]
ctx_skip_connections = True

question_lstm_size = [256]
question_skip_connections = True

# --- Attention MLP --------------------------------------------------------
# The two lists have matching lengths: one hidden size, one activation.
attention_mlp_hidden = [100]
attention_mlp_activations = [Tanh()]

# --- Output MLP -----------------------------------------------------------
# Both lists are empty, i.e. no hidden layers / activations are configured.
out_mlp_hidden = []
out_mlp_activations = []

# --- Optimisation ---------------------------------------------------------
# RMSProp first, then BasicMomentum, composed in that order.
step_rule = CompositeRule(
    [
        RMSProp(learning_rate=5e-5, decay_rate=0.95),
        BasicMomentum(momentum=0.9),
    ]
)

# --- Regularisation -------------------------------------------------------
dropout = 0.2
w_noise = 0.0

# --- Monitoring -----------------------------------------------------------
# Units are not shown here; presumably training iterations -- TODO confirm.
valid_freq = 1000
save_freq = 1000
print_freq = 100

# --- Parameter initialisation ---------------------------------------------
# NOTE(review): 0.01 is passed positionally; in Blocks this is expected to
# be the standard deviation -- confirm against the installed version.
weights_init = IsotropicGaussian(0.01)
biases_init = Constant(0.0)