aboutsummaryrefslogtreecommitdiff
path: root/data.py
diff options
context:
space:
mode:
authorAlex Auvolat <alex.auvolat@ens.fr>2015-05-04 13:15:23 -0400
committerAlex Auvolat <alex.auvolat@ens.fr>2015-05-04 13:15:23 -0400
commitde76aae44b6c0cbe9ab42c7ae215c3ae9e4e4055 (patch)
tree09c09a12861f0f6826cd33e3b77eba9a07076c49 /data.py
parent43e106e6630030dd34813295fe1d07bb86025402 (diff)
downloadtaxi-de76aae44b6c0cbe9ab42c7ae215c3ae9e4e4055.tar.gz
taxi-de76aae44b6c0cbe9ab42c7ae215c3ae9e4e4055.zip
Add TaxiGenerateSplits
Diffstat (limited to 'data.py')
-rw-r--r--data.py10
1 files changed, 7 insertions, 3 deletions
diff --git a/data.py b/data.py
index 92aa062..730a9ab 100644
--- a/data.py
+++ b/data.py
@@ -164,21 +164,25 @@ taxi_columns = [
]
taxi_columns_valid = taxi_columns + [
- ("destination_longitude", lambda l: float(l[9])),
- ("destination_latitude", lambda l: float(l[10])),
+ ("destination_longitude", lambda l: numpy.float32(float(l[9]))),
+ ("destination_latitude", lambda l: numpy.float32(float(l[10]))),
("time", lambda l: int(l[11])),
]
train_files=["%s/split/train-%02d.csv" % (DATA_PATH, i) for i in range(100)]
-valid_files=["%s/split/valid.csv" % (DATA_PATH,)]
+valid_files=["%s/split/valid2-cut.csv" % (DATA_PATH,)]
test_file="%s/test.csv" % (DATA_PATH,)
train_data=TaxiData(train_files, taxi_columns)
valid_data = TaxiData(valid_files, taxi_columns_valid)
test_data = TaxiData(test_file, taxi_columns, has_header=True)
+valid_trips = [l for l in open(DATA_PATH + "/split/valid2-cut-ids.txt")]
+
def train_it():
return DataIterator(DataStream(train_data))
def test_it():
return DataIterator(DataStream(valid_data))
+
+