diff options
author | Alex Auvolat <alex.auvolat@ens.fr> | 2015-04-29 19:41:36 -0400 |
---|---|---|
committer | Alex Auvolat <alex.auvolat@ens.fr> | 2015-04-29 19:41:36 -0400 |
commit | 43e106e6630030dd34813295fe1d07bb86025402 (patch) | |
tree | c3a604d8d023e35532522a18da06e8c25dc251c6 /data.py | |
parent | 8b27690c8d77585f173412e5719787c48272674e (diff) | |
download | taxi-43e106e6630030dd34813295fe1d07bb86025402.tar.gz taxi-43e106e6630030dd34813295fe1d07bb86025402.zip |
Fix
Diffstat (limited to 'data.py')
-rw-r--r-- | data.py | 5 |
1 files changed, 3 insertions, 2 deletions
```diff
@@ -2,6 +2,7 @@ import ast, csv
 import socket
 import fuel
 import numpy
+import h5py
 from enum import Enum
 from fuel.datasets import Dataset
 from fuel.streams import DataStream
@@ -28,7 +29,7 @@ dataset_size = 1710670
 
 def make_client_ids():
     f = h5py.File(H5DATA_PATH, "r")
-    l = f['uniq_origin_call']
+    l = f['unique_origin_call']
     r = {}
     for i in range(l.shape[0]):
         r[l[i]] = i
@@ -37,7 +38,7 @@ def make_client_ids():
 client_ids = make_client_ids()
 
 def get_client_id(n):
-    if n in client_ids:
+    if n in client_ids and client_ids[n] <= n_train_clients:
         return client_ids[n]
     else:
         return 0
```