Add --shuffle option for city combinations; lower Makefile chunk size from 8000 to 4200
This commit is contained in:
parent
b8ac59d942
commit
294d4bb1cd
2
Makefile
2
Makefile
@ -2,7 +2,7 @@ all: install data train eval
|
|||||||
|
|
||||||
city_distances_full.csv: check generate_data.py
|
city_distances_full.csv: check generate_data.py
|
||||||
@echo "Generating distance data..."
|
@echo "Generating distance data..."
|
||||||
@bash -c 'time python generate_data.py --country US --workers 8 --chunk-size 8000'
|
@bash -c 'time python generate_data.py --country US --workers 8 --chunk-size 4200'
|
||||||
|
|
||||||
data: city_distances_full.csv
|
data: city_distances_full.csv
|
||||||
|
|
||||||
|
@ -34,6 +34,11 @@ parser.add_argument(
|
|||||||
type=str,
|
type=str,
|
||||||
default="city_distances_full.csv",
|
default="city_distances_full.csv",
|
||||||
)
|
)
|
||||||
|
parser.add_argument(
|
||||||
|
"--shuffle",
|
||||||
|
action="store_true",
|
||||||
|
help="Option to shuffle combinations list before iterating over it",
|
||||||
|
)
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
|
||||||
|
|
||||||
@ -116,7 +121,8 @@ def main():
|
|||||||
cities = list(us_cities.values())
|
cities = list(us_cities.values())
|
||||||
print(f"Num cities: {len(cities)}")
|
print(f"Num cities: {len(cities)}")
|
||||||
city_combinations = list(itertools.combinations(cities, 2))
|
city_combinations = list(itertools.combinations(cities, 2))
|
||||||
# np.random.shuffle(city_combinations) # will this help or hurt caching? 1.03it/s
|
if args.shuffle:
|
||||||
|
np.random.shuffle(city_combinations)
|
||||||
chunk_size = args.chunk_size
|
chunk_size = args.chunk_size
|
||||||
num_chunks = len(city_combinations) // chunk_size + 1
|
num_chunks = len(city_combinations) // chunk_size + 1
|
||||||
output_file = args.output_file
|
output_file = args.output_file
|
||||||
|
Loading…
Reference in New Issue
Block a user