# Export all trips to "<args.data>/<args.city_name>.h5".
# Layout: one dataset per trip, named by its 1-based index, under each of
# /trips/coord, /trips/osmid and /trips/length; the file attribute 'num'
# stores len(routes_valid).
# NOTE(review): 'num' is taken from routes_valid while the loop is driven by
# routes_length -- presumably the three lists always have equal length; confirm.
# NOTE(review): creating a very large number of datasets inside one group gets
# progressively slower; h5py documents libver='latest' on File as the most
# performant format, at the cost of backward compatibility -- evaluate before
# enabling.
with h5py.File(os.path.join(args.data, f'{args.city_name}.h5'), "w") as f:
    f.attrs['num'] = len(routes_valid)
    # Keep the group handles so each dataset is created relative to its group
    # instead of rebuilding and re-resolving an absolute path every iteration.
    coord_group = f.create_group('/trips/coord')
    osmid_group = f.create_group('/trips/osmid')
    length_group = f.create_group('/trips/length')
    for i, length in enumerate(routes_length):
        name = str(i + 1)  # dataset names are 1-based
        coord_group.create_dataset(name, data=np.array(routes_coord[i]))
        osmid_group.create_dataset(name, data=np.array(routes_valid[i]))
        length_group.create_dataset(name, data=np.array(length))
        # Progress report every 50,000 trips (i is the 0-based index).
        if i % 50_000 == 0:
            print_time(f'saved {i} trips')
大约有 150 万条数据,写到后面速度变得非常慢。

加入之后:

