diff options
author | Alex Auvolat <alex.auvolat@ens.fr> | 2015-05-04 13:15:42 -0400 |
---|---|---|
committer | Alex Auvolat <alex.auvolat@ens.fr> | 2015-05-04 13:15:42 -0400 |
commit | 9adfe767010e23823089b4db94cb4dc53cc3c12a (patch) | |
tree | adaa2d3a72080208e5267dbd8e0b238f06d8f88f /convert_data.py | |
parent | 71bb4d90da2bad933fdca48d1879886fe7aa9bc8 (diff) | |
parent | a042000073bf348fddff23f41d30f49f2e874adb (diff) | |
download | taxi-9adfe767010e23823089b4db94cb4dc53cc3c12a.tar.gz taxi-9adfe767010e23823089b4db94cb4dc53cc3c12a.zip |
Merge branch 'master' of github.com:adbrebs/taxi
Diffstat (limited to 'convert_data.py')
-rwxr-xr-x | convert_data.py | 3 |
1 file changed, 2 insertions, 1 deletion
```diff
diff --git a/convert_data.py b/convert_data.py
index f81b40f..9684fa9 100755
--- a/convert_data.py
+++ b/convert_data.py
@@ -104,8 +104,9 @@ def convert(input_directory, save_path):
     h5file = h5py.File(save_path, 'w')
     split = {}
     split.update(read_stands(input_directory, h5file))
-    split.update(read_taxis(input_directory, h5file, 'test', 'test_'))
     split.update(read_taxis(input_directory, h5file, 'train', ''))
+    print 'First origin_call not present in training set: ', len(origin_call_dict)
+    split.update(read_taxis(input_directory, h5file, 'test', 'test_'))
     split.update(unique(h5file))
     h5file.attrs['split'] = H5PYDataset.create_split_array(split)
     h5file.flush()
```