Refactor models, clean the code and separate training from testing.

author: Étienne Simon <esimon@esimon.eu> 2015-05-18 16:22:00 -0400
committer: Étienne Simon <esimon@esimon.eu> 2015-05-18 16:22:00 -0400
commit: 6d946f29f7548c75e97f30c4356dbac200ee6cce (patch)
tree: 387e586c7ad0c1a0167d21451c9a8c877cf3ef0e /model/time_simple_mlp_tgtcls.py
parent: 1e6d08b0c9ac5983691b182631c71e9d46ee71cc (diff)
download: taxi-6d946f29f7548c75e97f30c4356dbac200ee6cce.tar.gz
taxi-6d946f29f7548c75e97f30c4356dbac200ee6cce.zip
1 files changed, 22 insertions, 56 deletions
diff --git a/model/time_simple_mlp_tgtcls.py b/model/time_simple_mlp_tgtcls.py
index 1f1eab7..35c8d8a 100644
--- a/model/time_simple_mlp_tgtcls.py
+++ b/model/time_simple_mlp_tgtcls.py
@@ -1,67 +1,33 @@
-from blocks.bricks import MLP, Rectifier, Linear, Sigmoid, Identity, Softmax
-from blocks.bricks.lookup import LookupTable
-
 import numpy
 import theano
 from theano import tensor
+from blocks.bricks import application, Softmax
 
-import data
 import error
+from model.mlp import FFMLP, Stream
 
-class Model(object):
-    def __init__(self, config):
-        # The input and the targets
-        x_firstk_latitude = (tensor.matrix('first_k_latitude') - data.train_gps_mean[0]) / data.train_gps_std[0]
-        x_firstk_longitude = (tensor.matrix('first_k_longitude') - data.train_gps_mean[1]) / data.train_gps_std[1]
-
-        x_lastk_latitude = (tensor.matrix('last_k_latitude') - data.train_gps_mean[0]) / data.train_gps_std[0]
-        x_lastk_longitude = (tensor.matrix('last_k_longitude') - data.train_gps_mean[1]) / data.train_gps_std[1]
-
-        input_list = [x_firstk_latitude, x_firstk_longitude, x_lastk_latitude, x_lastk_longitude]
-        embed_tables = []
-
-        self.require_inputs = ['first_k_latitude', 'first_k_longitude', 'last_k_latitude', 'last_k_longitude']
-
-        for (varname, num, dim) in config.dim_embeddings:
-            self.require_inputs.append(varname)
-            vardata = tensor.lvector(varname)
-            tbl = LookupTable(length=num, dim=dim, name='%s_lookup'%varname)
-            embed_tables.append(tbl)
-            input_list.append(tbl.apply(vardata))
-
-        y = tensor.lvector('travel_time')
-
-        # Define the model
-        mlp = MLP(activations=[Rectifier() for _ in config.dim_hidden] + [Softmax()],
-                           dims=[config.dim_input] + config.dim_hidden + [config.dim_output])
-        classes = theano.shared(numpy.array(config.tgtcls, dtype=theano.config.floatX), name='classes')
-
-        # Create the Theano variables
-        inputs = tensor.concatenate(input_list, axis=1)
-        # inputs = theano.printing.Print("inputs")(inputs)
-        cls_probas = mlp.apply(inputs)
-        outputs = tensor.dot(cls_probas, classes)
-
-        # outputs = theano.printing.Print("outputs")(outputs)
-        # y = theano.printing.Print("y")(y)
 
-        outputs.name = 'outputs'
+class Model(FFMLP):
+    def __init__(self, config, **kwargs):
+        super(Model, self, output_layer=Softmax).__init__(config, **kwargs)
+        self.classes = theano.shared(numpy.array(config.tgtcls, dtype=theano.config.floatX), name='classes')
+        self.inputs.append('input_time')
 
-        # Calculate the cost
-        cost = error.rmsle(outputs.flatten(), y.flatten())
-        cost.name = 'cost'
+    @application(outputs=['duration'])
+    def predict(self, **kwargs):
+        cls_probas = super(Model, self).predict(**kwargs)
+        return kwargs['input_time'] + tensor.dot(cls_probas, self.classes)
 
-        # Initialization
-        for tbl in embed_tables:
-            tbl.weights_init = config.embed_weights_init
-        mlp.weights_init = config.mlp_weights_init
-        mlp.biases_init = config.mlp_biases_init
+    @predict.property('inputs')
+    def predict_inputs(self):
+        return self.inputs
 
-        for tbl in embed_tables:
-            tbl.initialize()
-        mlp.initialize()
+    @application(outputs=['cost'])
+    def cost(self, **kwargs):
+        y_hat = self.predict(**kwargs)
+        y = kwargs['travel_time']
+        return error.rmsle(y_hat.flatten(), y.flatten())
 
-        self.cost = cost
-        self.monitor = [cost]
-        self.outputs = outputs
-        self.pred_vars = ['travel_time']
+    @cost.property('inputs')
+    def cost_inputs(self):
+        return self.inputs + ['travel_time']
author	Étienne Simon <esimon@esimon.eu>	2015-05-18 16:22:00 -0400
committer	Étienne Simon <esimon@esimon.eu>	2015-05-18 16:22:00 -0400
commit	6d946f29f7548c75e97f30c4356dbac200ee6cce (patch)
tree	387e586c7ad0c1a0167d21451c9a8c877cf3ef0e /model/time_simple_mlp_tgtcls.py
parent	1e6d08b0c9ac5983691b182631c71e9d46ee71cc (diff)
download	taxi-6d946f29f7548c75e97f30c4356dbac200ee6cce.tar.gz taxi-6d946f29f7548c75e97f30c4356dbac200ee6cce.zip